This is where the final project report write-up goes.

Before you submit, make sure everything runs as expected.

You can add sections as you see fit. Make sure you have a section called “Introduction” at the beginning and a section called “Conclusion” at the end. The rest is up to you!

## Introduction

- Load the tidyverse, ggplot2, rtweet, and readr packages

library(tidyverse)
library(ggplot2)
library(rtweet)
library(readr)

This data set was scraped from WineEnthusiast, a website that reviews and rates many different types of wines.

# Read the wine review CSV, then discard its first column.
# NOTE(review): the first column is presumably a row index -- confirm.
wines <- read.csv(file = "../data/winemag-data-130k-v2.csv")
wines <- wines[, -1]

# Fix the RNG seed so the 1,000-row random sample is reproducible.
set.seed(19630217)
wine_sample <- sample_n(wines, 1000)

EDA (correlation of price × points, with the DataExplorer library? using [this](https://datascienceplus.com/blazing-fast-eda-in-r-with-dataexplorer/))

# Scatter plot of price (y) against points (x) for every review in `wines`.
# na.rm = TRUE drops rows with missing values without emitting a warning;
# it is spelled out as TRUE because T is an ordinary variable that can be
# reassigned.
ggplot(data = wines, mapping = aes(x = points, y = price)) +
  geom_point(na.rm = TRUE)
# Summary statistics for `price` over all reviews: mean, minimum, maximum and
# standard deviation, each computed with missing values excluded.
summarise(
  wines,
  mean(price, na.rm = TRUE),
  min(price, na.rm = TRUE),
  max(price, na.rm = TRUE),
  sd(price, na.rm = TRUE)
)
# Summary statistics for `points` over all reviews: mean, minimum, maximum and
# standard deviation, each computed with missing values excluded.
summarise(
  wines,
  mean(points, na.rm = TRUE),
  min(points, na.rm = TRUE),
  max(points, na.rm = TRUE),
  sd(points, na.rm = TRUE)
)

Select the provinces based on points, and select the best province for wine based on the average points in the sample.

# Find the average number of points across the 1,000 sampled wines

# Mean of `points` over the whole sample. No grouping is applied, so the
# result is a single row holding one overall average (not one per province).
wine_per_province <- summarise(
  select(wine_sample, province, points),
  points = mean(points)
)
wine_per_province

# Find the best province for wine using the average points across the 1,000 samples
# TODO: drop the descriptions, or just select price? Set points to max(points)?

# Keep the sampled wines that score above the sample's mean points.
# The cutoff is computed from `wine_sample` rather than hard-coded (it was
# 88.669, presumably the sample mean copied from an earlier run), so it stays
# correct if the seed or sample size changes.
# The result is still grouped by province and points, as before.
# NOTE(review): this returns individual above-average wines; it does not yet
# rank provinces against each other.
best_province <- wine_sample %>%
  group_by(province, points) %>%
  filter(points > mean(wine_sample$points, na.rm = TRUE))
best_province

Rating distribution

Best wine, by variety

# Rank wine varieties by their mean points, highest first.
# TODO: sort by price, then points -- or model a price/points interaction?
# Result is only printed for now; a name such as wine_cheap_but_good is pending.
arrange(
  summarise(group_by(wines, variety), mean_points = mean(points)),
  desc(mean_points)
)
NA
NA
# Ask how much the reader is willing to spend on a bottle.
# readline() only waits for input in an interactive session; when the notebook
# is knit or run with Rscript it returns "" immediately, which would turn
# user_price into NA and make the price filter below return no rows.
user_price <- if (interactive()) {
  readline(prompt = "How much are you willing to spend on a bottle?")
} else {
  ""
}
user_price <- as.integer(user_price)

# Fall back to a default budget when nothing usable was entered.
if (is.na(user_price)) {
  user_price <- 17L
}

# Wines priced at or below the user's budget, best-scoring first, showing only
# title, price and points. Rows with a missing price are dropped by the filter.
# Result is only printed for now; the name best_cheap_wine is pending.
wines %>%
  select(title, price, points) %>%
  filter(price <= user_price) %>%
  arrange(desc(points))

## Conclusion

LS0tDQp0aXRsZTogIkZpbmFsIFJlcG9ydCBmb3IgSW50cm8gdG8gRGF0YSBTY2llbmNlIg0Kb3V0cHV0OiBodG1sX25vdGVib29rDQotLS0NClRoaXMgaXMgd2hlcmUgdGhlIGZpbmFsIHByb2plY3QgcmVwb3J0IHdyaXRlLXVwIGdvZXMuIA0KDQpCZWZvcmUgeW91IHN1Ym1pdCwgbWFrZSBzdXJlIGV2ZXJ5dGhpbmcgcnVucyBhcyBleHBlY3RlZC4NCg0KWW91IGNhbiBhZGQgc2VjdGlvbnMgYXMgeW91IHNlZSBmaXQuIE1ha2Ugc3VyZSB5b3UgaGF2ZSBhIHNlY3Rpb24gY2FsbGVkICJJbnRyb2R1Y3Rpb24iIGF0IHRoZSBiZWdpbm5pbmcgYW5kIGEgc2VjdGlvbiBjYWxsZWQgIkNvbmNsdXNpb24iIGF0IHRoZSBlbmQuIFRoZSByZXN0IGlzIHVwIHRvIHlvdSENCg0KDQoNCiMjSW50cm9kdWN0aW9uDQotIExvYWQgdGhlIGB0aWR5dmVyc2UsIGdncGxvdCwgYW5kIHJ0d2VldGAgcGFja2FnZXMNCmBgYHtyLCBtZXNzYWdlPUZBTFNFLCB3YXJuaW5nPUZBTFNFfQ0KbGlicmFyeSh0aWR5dmVyc2UpDQpsaWJyYXJ5KGdncGxvdDIpDQpsaWJyYXJ5KHJ0d2VldCkNCmxpYnJhcnkocmVhZHIpDQpgYGANCg0KDQpUaGlzIGRhdGEgc2V0IHdhcyBzY3JhcGVkIGZyb20gV2luZUVudGh1c2lhc3QsIGEgd2Vic2l0ZSB0aGF0IHJldmlld3MgYW5kIHJhdGVzIG1hbnkgZGlmZmVyZXQgdHlwZXMgb2Ygd2luZXMuICANCg0KLSBUaGlzIGRhdGFzZXQgaW5jbHVkZXMgaW5mb3JtYXRpb24gb2Ygb2YgMTMwLDAwMCB3aW5lIHJldmlld3Mgd2l0aCAxMCBkaWZmZXJlbnQgZGF0YSBmaWVsZHMuIA0KICANCg0KYGBge3J9DQp3aW5lcyA8LSByZWFkLmNzdihmaWxlID0gJy4uL2RhdGEvd2luZW1hZy1kYXRhLTEzMGstdjIuY3N2JylbLC0xXQ0KYGBgDQoNCmBgYHtyfQ0Kc2V0LnNlZWQoMTk2MzAyMTcpDQp3aW5lX3NhbXBsZTwtIHNhbXBsZV9uKHdpbmVzLCAxMDAwKQ0KYGBgDQoNCkVEQSAoY29ycmVsYXRpb24gcHJpY2VYcG9pbnRzLCB3aXRoIGBgYERhdGFFeHBsb3JlcmBgYCBsaWJyYXJ5PyB1c2luZyAodGhpcylbaHR0cHM6Ly9kYXRhc2NpZW5jZXBsdXMuY29tL2JsYXppbmctZmFzdC1lZGEtaW4tci13aXRoLWRhdGFleHBsb3Jlci9dKQ0KYGBge3J9DQp3aW5lcyAlPiUgDQogIGdncGxvdCgpICsNCiAgICBnZW9tX3BvaW50KG1hcHBpbmcgPSAoYWVzKHggPSBwb2ludHMsIHkgPSBwcmljZSkpLCBuYS5ybSA9IFQpDQpgYGANCg0KYGBge3J9DQp3aW5lcyAlPiUNCiAgICBzdW1tYXJpemUobWVhbihwcmljZSwgbmEucm09VFJVRSksIA0KICAgICAgICAgICAgICBtaW4ocHJpY2UsIG5hLnJtPVRSVUUpLA0KICAgICAgICAgICAgICBtYXgocHJpY2UsbmEucm09VFJVRSksIA0KICAgICAgICAgICAgICBzZChwcmljZSwgbmEucm09VFJVRSkpDQpgYGANCg0KYGBge3J9DQp3aW5lcyAlPiUNCiAgICBzdW1tYXJpemUobWVhbihwb2ludHMsIG5hLnJtPVRSVUUpLCANCiAgICAgICAgICAgICAgbWluKHBvaW50cywgbmEucm09VFJVRSksDQogICAgICAgICAgICAgIG1heChw
b2ludHMsbmEucm09VFJVRSksIA0KICAgICAgICAgICAgICBzZChwb2ludHMsIG5hLnJtPVRSVUUpKQ0KYGBgDQoNClNlbGVjdCB0aGUgcHJvdmluY2VzIGJhc2VkIG9uIHBvaW50cyAgYW5kIFNlbGVjdCB0aGUgYmVzdCBwcm92aW5jZSBmb3Igd2luZSBiYXNlZCBvbiB0aGUgYXZlcmFnZSBwb2ludHMgb2YgdGhlIHNhbXBsZSBzaXplLiANCg0KI2ZpbmQgdGhlIGF2ZXJhZ2UgbnVtYmVyIG9mIHBvaW50cyBhY3Jvc3MgdGhlIDEsMDAwIHNhbXBsZXMNCmBgYHtyfQ0Kd2luZV9wZXJfcHJvdmluY2UgPC0gd2luZV9zYW1wbGUgJT4lIA0KICBzZWxlY3QocHJvdmluY2UsIHBvaW50cykgJT4lIA0KICBzdW1tYXJpc2UocG9pbnRzID0gbWVhbihwb2ludHMpKQ0Kd2luZV9wZXJfcHJvdmluY2UNCmBgYA0KDQoNCiNGaW5kIHRoZSBiZXN0IHByb3ZpbmNlIGZvciB3aW5lIHVzaW5nIHRoZSBhdmVyYWdlIHBvaW50cyBhY3Jvc3MgdGhlIDEsMDAwIHNhbXBsZXMNCiNkcm9wIHRoZSBkZXNjcmlwdGlvbnMgb3IganVzdCBzZWxlY3QgcHJpY2U/IHNldCBwb2ludHMgdG8gbWF4KHBvaW50cykNCmBgYHtyfQ0KYmVzdF9wcm92aW5jZSA8LSB3aW5lX3NhbXBsZSAlPiUgDQogIGdyb3VwX2J5KHByb3ZpbmNlLCBwb2ludHMpICU+JSANCiAgZmlsdGVyKHBvaW50cyA+IDg4LjY2OSkNCmJlc3RfcHJvdmluY2UgIA0KYGBgDQoNCg0KUmF0aW5nIGRpc3RyaWJ1dGlvbg0KDQpgYGB7cn0NCg0KYGBgDQoNCkJlc3Qgd2luZSwgYnkgdmFyaWV0eQ0KYGBge3J9DQojd2luZV9iZXN0X3ZhcmlldHkgPC0gDQp3aW5lcyAlPiUgDQogIGdyb3VwX2J5KHZhcmlldHkpICU+JSANCiAgc3VtbWFyaXNlKG1lYW5fcG9pbnRzID0gbWVhbihwb2ludHMpKSAlPiUgDQogIGFycmFuZ2UoZGVzYyhtZWFuX3BvaW50cykpIA0KICANCmBgYA0KDQpgYGB7cn0NCnVzZXJfcHJpY2UgPC0gcmVhZGxpbmUocHJvbXB0ID0gIkhvdyBtdWNoIGFyZSB5b3Ugd2lsbGluZyB0byBzcGVuZCBvbiBhIGJvdHRsZT8iKQ0KdXNlcl9wcmljZSA8LSBhcy5pbnRlZ2VyKHVzZXJfcHJpY2UpDQoNCndpbmVzICU+JSANCiAgZmlsdGVyKHByaWNlIDw9IHVzZXJfcHJpY2UpICU+JSANCiAgYXJyYW5nZShkZXNjKHBvaW50cykpICU+JSANCiAgc2VsZWN0KHRpdGxlLCBwcmljZSwgcG9pbnRzKQ0KYGBgDQoNCg0KDQojI0NvbmNsdXNpb24NCg==